# Launch s1_train.py through torchrun as a single process on a single node.
#
# s1_train.py is given as a relative path, so it is resolved against the
# current working directory.

# Device list exported to the launched processes. Going by the variable's
# name, this selects which Ascend devices the runtime exposes -- only
# device 0 here.
ASCEND_RT_VISIBLE_DEVICES=0
export ASCEND_RT_VISIBLE_DEVICES
# Alternative setting that lists eight devices (0 through 7):
#export ASCEND_RT_VISIBLE_DEVICES=0,1,2,3,4,5,6,7

# One node, one worker process per node, rendezvous on port 29500.
torchrun \
  --nnodes=1 \
  --nproc_per_node=1 \
  --master_port=29500 \
  s1_train.py
